Use unicode-data instead of downloading external files
author Peter Colberg <peter@colberg.org>
Wed, 3 Sep 2025 11:15:04 +0000 (13:15 +0200)
committer Matthias Geiger <werdahias@debian.org>
Wed, 3 Sep 2025 11:15:04 +0000 (13:15 +0200)
Forwarded: not-needed
Last-Update: 2025-09-01

Replace external links with copies of Unicode data and GNU Unifont
provided by the packages unicode-data and ttf-unifont, respectively.
Last-Update: 2025-09-01
Gbp-Pq: Name use-unicode-data.patch

diff --git a/data/Makefile b/data/Makefile
index aa2d8a7331ca0f4113e57ba67cd4867e3197330a..24d09ac1bbc79c6bfbc98638b16683808a132719 100644
--- a/data/Makefile
+++ b/data/Makefile
@@ -24,37 +24,37 @@ utf8proc_data.c.new: data_generator.jl $(RAWDATA)
 UNICODE_VERSION=16.0.0
 
 UnicodeData.txt:
-       $(CURL) $(CURLFLAGS) -o $@ https://www.unicode.org/Public/$(UNICODE_VERSION)/ucd/UnicodeData.txt
+       cp /usr/share/unicode/UnicodeData.txt $@
 
 EastAsianWidth.txt:
-       $(CURL) $(CURLFLAGS) -o $@ $(URLCACHE)https://www.unicode.org/Public/$(UNICODE_VERSION)/ucd/EastAsianWidth.txt
+       cp /usr/share/unicode/extracted/DerivedEastAsianWidth.txt $@
 
 GraphemeBreakProperty.txt:
-       $(CURL) $(CURLFLAGS) -o $@ $(URLCACHE)https://www.unicode.org/Public/$(UNICODE_VERSION)/ucd/auxiliary/GraphemeBreakProperty.txt
+       cp /usr/share/unicode/auxiliary/GraphemeBreakProperty.txt $@
 
 DerivedCoreProperties.txt:
-       $(CURL) $(CURLFLAGS) -o $@ $(URLCACHE)https://www.unicode.org/Public/$(UNICODE_VERSION)/ucd/DerivedCoreProperties.txt
+       cp /usr/share/unicode/DerivedCoreProperties.txt $@
 
 CompositionExclusions.txt:
-       $(CURL) $(CURLFLAGS) -o $@ $(URLCACHE)https://www.unicode.org/Public/$(UNICODE_VERSION)/ucd/CompositionExclusions.txt
+       cp /usr/share/unicode/CompositionExclusions.txt $@
 
 CaseFolding.txt:
-       $(CURL) $(CURLFLAGS) -o $@ $(URLCACHE)https://www.unicode.org/Public/$(UNICODE_VERSION)/ucd/CaseFolding.txt
+       cp /usr/share/unicode/CaseFolding.txt $@
 
 NormalizationTest.txt:
-       $(CURL) $(CURLFLAGS) -o $@ $(URLCACHE)https://www.unicode.org/Public/$(UNICODE_VERSION)/ucd/NormalizationTest.txt
+       bzip2 -d < /usr/share/unicode/NormalizationTest.txt.bz2 > $@
 
 GraphemeBreakTest.txt:
-       $(CURL) $(CURLFLAGS) -o $@ $(URLCACHE)https://www.unicode.org/Public/$(UNICODE_VERSION)/ucd/auxiliary/GraphemeBreakTest.txt
+       cp /usr/share/unicode/auxiliary/GraphemeBreakTest.txt $@
 
 emoji-data.txt:
-       $(CURL) $(CURLFLAGS) -o $@ $(URLCACHE)https://unicode.org/Public/$(UNICODE_VERSION)/ucd/emoji/emoji-data.txt
+       cp /usr/share/unicode/emoji/emoji-data.txt $@
 
 Uppercase.txt: DerivedCoreProperties.txt
-       $(JULIA) -e 'print(match(r"# Derived Property: Uppercase.*?# Total code points:"s, read("DerivedCoreProperties.txt", String)).match)' > $@
+       grep -zoP '(?s)# Derived Property: Uppercase.*?# Total code points:' DerivedCoreProperties.txt > $@
 
 Lowercase.txt: DerivedCoreProperties.txt
-       $(JULIA) -e 'print(match(r"# Derived Property: Lowercase.*?# Total code points:"s, read("DerivedCoreProperties.txt", String)).match)' > $@
+       grep -zoP '(?s)# Derived Property: Lowercase.*?# Total code points:' DerivedCoreProperties.txt > $@
 
 clean:
        rm -f $(RAWDATA) NormalizationTest.txt GraphemeBreakTest.txt